# encoding: utf-8

from itertools import islice

from tqdm import tqdm
# Source file to sample from; the commented-out line is an alternate location.
path = "G:/baiduyunDownload/563w_baidubaike.json/563w_baidubaike.json"
# path = "D:/data/pretrain_datas/563w_baidubaike.json"

# Number of leading lines copied into the demo file.
SAMPLE_LINES = 100

# Copy the first SAMPLE_LINES lines of the source file into ./demo.json.
# The source is opened first, so a missing input fails before the output
# file is created or truncated. islice stops after SAMPLE_LINES lines (or at
# end of file if the source is shorter), so the rest of the file is not read.
with open(path, "r", encoding="utf-8") as src, open(
    "./demo.json", "w", encoding="utf-8"
) as dst:
    dst.writelines(islice(src, SAMPLE_LINES))
